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SEQUENCE LISTING 

<110> ADLER, JON ELLIOT 
ZOZULYA, SERGEY 
LI, XIAODONG
O'CONNELL, SHAWN
STASZEWSKI, LENA 



o 



<120> T1R TASTE RECEPTORS AND GENES ENCODING SAME
<130> 078003/0277870/RXT



<140> 09/799,629 
<141> 2001-03-07 

<150> 60/187,546 
<151> 2000-03-07 

<150> 60/195,536 
<151> 2000-04-07 

<150> 60/209,840 
<151> 2000-06-06 

<150> 60/214,213 
<151> 2000-06-23 

<150> 60/226,448
<151> 2000-08-17 

<150> 60/259,227 
<151> 2001-01-03 

<160> 20 



<170> PatentIn Ver. 2.1



<210> 1 

<211> 876 

<212> DNA 

<213> Homo sapiens 



<400> 1 

agcctggcag 

ggacaccact 

tcctctgccc 

ctgccgtgcc 

ctctgggctc 

atgaaggggg 

ctccgcagcc 

tgggtcgggg 

ctgcggttct 

aaatggccgt 

acgacctctt 

tggccaaggc 

gtgtgctggc 

tcagcttctt 

cctgccccgt 



tggcctcagg 
ggggccccag 
gctccccgcc 
tgttggaagt 
tcctgcaccc 
actacgtgct 
ggacacggcc 
tcagggtgac 
gtgtggcccc 
ggaggagatc 
tgatacgtgc 
aggcagccgc 
tgtcatcggg 
cctcatgccc 
gggagcccct 



cagagtctga 
ggtgtggcaa 
ccgggctcac 
tgcctctgcc 
tgggacgggg 

gggggggctg 

cagcagccct 
caggtctggg 
aggttctcct 
aacaacaagt 
tcggagcctg 
gacatcgccg 
ccccactcgt 
cagtggggcg 
tgtgtcagga 



cgcgcacaaa 
gtgaggatgg 
tccatgtgag 
atgctgggcc 
gccccattgt 
ttccccctgg 
gtgtgcacca 
gtgctcctga 
caaacggcct 
cggatctgct 
tggtggccat 
cctactgcaa 
cagagctcgc 
ccccccacca 
gaatgc 



ctttcaggcc 
caagggtttt 
gccccagtcg 
ctgctgtcct 
gcctgtcaca 
gcgaggccga 
ggtacagagg 
gctggggccg 
gctctgggca 
gcccgggctg 
gaagcccagc 
ctacacgcag 
catggtcacc 
tcacccaccc 



caggaagcga 
gctaaacaaa 
gggcagccac 
gggcctcagc 
gcaacttagg 
ggaggctggc 
tgggacggcc 
aggtggccat 
ctggccatga 
cgcctgggct 
ctcatgttcc 
taccagcccc 
ggcaagttct 
ccaaccaacc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

876 



o o 



<210> 2 

<211> 2687 

<212> DNA 

<213> Homo sapiens 

<400> 2 

tacatgcacc ccacccagcc ctgccctggg agccctgtgt cagaagatgc tcttggcctt 60 
gcaggtcagc tacggtgcta gcatggagct gctgagcgcc cgggagacct tcccctcctt 120 
cttccgcacc gtgcccagcg accgtgtgca gctgacggcc gccgcggagc tgctgcagga 180 
gttcggctgg aactgggtgg ccgccctggg cagcgacgac gagtacggcc ggcagggcct 240 
gagcatcttc tcggccctgg ccgcggcacg cggcatctgc atcgcgcacg agggcctggt 300
gccgctgccc cgtgccgatg actcgcggct ggggaaggtg caggacgtcc tgcaccaggt 360 
gaaccagagc agcgtgcagg tggtgctgct gttcgcctcc gtgcacgccg cccacgccct 420 
cttcaactac agcatcagca gcaggctctc gcccaaggtg tgggtggcca gcgaggcctg 480 
gctgacctct gacctggtca tggggctgcc cggcatggcc cagatgggca cggtgcttgg 540 
cttcctccag aggggtgccc agctgcacga gttcccccag tacgtgaaga cgcacctggc 600 
cctggccacc gacccggcct tctgctctgc cctgggcgag agggagcagg gtctggagga 660 
ggacgtggtg ggccagcgct gcccgcagtg tgactgcatc acgctgcaga acgtgagcgc 720 
agggctaaat caccaccaga cgttctctgt ctacgcagct gtgtatagcg tggcccaggc 780 
cctgcacaac actcttcagt gcaacgcctc aggctgcccc gcgcaggacc ccgtgaagcc 840
ctggcaggtg agcccgggag atgggggtgt gctgtcctct gcatgtgccc aggccaccag 900 
gcacggccac cacgcctgag ctggaggtgg ctggcggctc agccccgtcc cccgcccgca 960 
gctcctggag aacatgtaca acctgacctt ccacgtgggc gggctgccgc tgcggttcga 1020 
cagcagcgga aacgtggaca tggagtacga cctgaagctg tgggtgtggc agggctcagt 1080 
gcccaggctc cacgacgtgg gcaggttcaa cggcagcctc aggacagagc gcctgaagat 1140 
ccgctggcac acgtctgaca accaggtgag gtgagggtgg gtgtgccagg cgtgcccgtg 1200 
gtagcccccg cggcagggcg cagcctgggg gtgggggccg ttccagtctc ccgtgggcat 1260
gcccagccga gcagagccag accccaggcc tgtgcgcaga agcccgtgtc ccggtgctcg 1320
cggcagtgcc aggagggcca ggtgcgccgg gtcaaggggt tccactcctg ctgctacgac 1380 
tgtgtggact gcgaggcggg cagctaccgg caaaacccag gtgagccgcc ttcccggcag 1440 
gcgggggtgg gaacgcagca ggggagggtc ctgccaagtc ctgactctga gaccagagcc 1500
cacagggtac aagacgaaca cccagcgccc ttctcctctc tcacagacga catcgcctgc 1560 
accttttgtg gccaggatga gtggtccccg gagcgaagca cacgctgctt ccgccgcagg 1620 
tctcggttcc tggcatgggg cgagccggct gtgctgctgc tgctcctgct gctgagcctg 1680 
gcgctgggcc ttgtgctggc tgctttgggg ctgttcgttc accatcggga cagcccactg 1740 
gttcaggcct cgggggggcc cctggcctgc tttggcctgg tgtgcctggg cctggtctgc 1800 
ctcagcgtcc tcctgttccc tggccagccc agccctgccc gatgcctggc ccagcagccc 1860 
ttgtcccacc tcccgctcac gggctgcctg agcacactct tcctgcaggc ggccgagatc 1920 
ttcgtggagt cagaactgcc tctgagctgg gcagaccggc tgagtggctg cctgcggggg 1980 
ccctgggcct ggctggtggt gctgctggcc atgctggtgg aggtcgcact gtgcacctgg 2040 
tacctggtgg ccttcccgcc ggaggtggtg acggactggc acatgctgcc cacggaggcg 2100 
ctggtgcact gccgcacacg ctcctgggtc agcttcggcc tagcgcacgc caccaatgcc 2160 
acgctggcct ttctctgctt cctgggcact ttcctggtgc ggagccagcc gggctgctac 2220 
aaccgtgccc gtggcctcac ctttgccatg ctggcctact tcatcacctg ggtctccttt 2280 
gtgcccctcc tggccaatgt gcaggtggtc ctcaggcccg ccgtgcagat gggcgccctc 2340 
ctgctctgtg tcctgggcat cctggctgcc ttccacctgc ccaggtgtta cctgctcatg 2400 
cggcagccag ggctcaacac ccccgagttc ttcctgggag ggggccctgg ggatgcccaa 2460 
ggccagaatg acgggaacac aggaaatcag gggaaacatg agtgacccaa ccctgtgatc 2520 
tcagccccgg tgaacccaga cttagctgcg atccccccca agccagcaat gacccgtgtc 2580 
tcgctacaga gaccctcccg ctctaggttc tgaccccagg ttgtctcctg accctgaccc 2640 
cacagtgagc cctaggcctg gagcacgtgg acacccctgt gaccatc 2687 



<210> 3 
<211> 2553 



n 



o 



<212> DNA 

<213> Homo sapiens 



<400> 3 

atgctgggcc 

gccccattgt 

ttccccctgg 

gtgtgcacca 

gaggagatca 

gatacgtgct 

ggcagccgcg 

gtcatcgggc 

ctcatgcccc 

ttcttccgca 

gagttcggct 

ctgagcatct 

gtgccgctgc 

gtgaaccaga 

ctcttcaact 

tggctgacct 

ggcttcctcc 

gccctggcca 

gaggacgtgg 

gcagggctaa 

gccctgcaca 

ccctggcagc 

cggttcgaca 

ggctcagtgc 

ctgaagatcc 

tgccaggagg 

gactgcgagg 

caggatgagt 

gcatggggcg 

gtgctggctg 

ggggggcccc 

ctgttccctg 

ccgctcacgg 

gaactgcctc 

ctggtggtgc 

ttcccgccgg 

cgcacacgct 

ctctgcttcc 

ggcctcacct 

gccaatgtgc 

ctgggcatcc 

ctcaacaccc 

gggaacacag 



ctgctgtcct 
gcctgtcaca 
gcgaggccga 
ggttctcctc 
acaacaagtc 
cggagcctgt 
acatcgccgc 
cccactcgtc 
actacggtgc 
ccgtgcccag 
ggaactgggt 
tctcggccct 
cccgtgccga 
gcagcgtgca 
acagcatcag 
ctgacctggt 
agaggggtgc 
ccgacccggc 
tgggccagcg 
atcaccacca 
acactcttca 
tcctggagaa 
gcagcggaaa 
ccaggctcca 
gctggcacac 
gccaggtgcg 
cgggcagcta 
ggtccccgga 
agccggctgt 
ctttggggct 
tggcctgctt 
gccagcccag 
gctgcctgag 
tgagctgggc 
tgctggccat 
aggtggtgac 
cctgggtcag 
tgggcacttt 
ttgccatgct 
aggtggtcct 
tggctgcctt 
ccgagttctt 
gaaatcaggg 



gggcctcagc 
gcaacttagg 
ggaggctggc 
aaacggcctg 
ggatctgctg 
ggtggccatg 
ctactgcaac 
agagctcgcc 
tagcatggag 
cgaccgtgtg 
ggccgccctg 
ggccgcggca 
tgactcgcgg 
ggtggtgctg 
cagcaggctc 
catggggctg 
ccagctgcac 
cttctgctct 
ctgcccgcag 
gacgttctct 
gtgcaacgcc 
catgtacaac 
cgtggacatg 
cgacgtgggc 
gtctgacaac 
ccgggtcaag 
ccggcaaaac 
gcgaagcaca 
gctgctgctg 
gttcgttcac 
tggcctggtg 
ccctgcccga 
cacactcttc 
agaccggctg 
gctggtggag 
ggactggcac 
cttcggccta 
cctggtgcgg 
ggcctacttc 
caggcccgcc 
ccacctgccc 
cctgggaggg 
gaaacatgag 



ctctgggctc 
atgaaggggg 
ctccgcagcc 
ctctgggcac 
cccgggctgc 
aagcccagcc 
tacacgcagt 
atggtcaccg 
ctgctgagcg 
cagctgacgg 
ggcagcgacg 
cgcggcatct 
ctggggaagg 
ctgttcgcct 
tcgcccaagg 
cccggcatgg 
gagttccccc 
gccctgggcg 
tgtgactgca 
gtctacgcag 
tcaggctgcc 
ctgaccttcc 
gagtacgacc 
aggttcaacg 
cagaagcccg 
gggttccact 
ccagacgaca 
cgctgcttcc 
ctcctgctgc 
catcgggaca 
tgcctgggcc 
tgcctggccc 
ctgcaggcgg 
agtggctgcc 
gtcgcactgt 
atgctgccca 
gcgcacgcca 
agccagccgg 
atcacctggg 
gtgcagatgg 
aggtgttacc 
ggccctgggg 
tga 



tcctgcaccc 
actacgtgct 
ggacacggcc 
tggccatgaa 
gcctgggcta 
tcatgttcct 
accagccccg 
gcaagttctt 
cccgggagac 
ccgccgcgga 
acgagtacgg 
gcatcgcgca 
tgcaggacgt 
ccgtgcacgc 
tgtgggtggc 
cccagatggg 
agtacgtgaa 
agagggagca 
tcacgctgca 
ctgtgtatag 
ccgcgcagga 
acgtgggcgg 
tgaagctgtg 
gcagcctcag 
tgtcccggtg 
cctgctgcta 
tcgcctgcac 
gccgcaggtc 
tgagcctggc 
gcccactggt 
tggtctgcct 
agcagccctt 
ccgagatctt 
tgcgggggcc 
gcacctggta 
cggaggcgct 
ccaatgccac 
gctgctacaa 
tctcctttgt 
gcgccctcct 
tgctcatgcg 
atgcccaagg 



tgggacgggg 
gggggggctg 
cagcagccct 
aatggccgtg 
cgacctcttt 
ggccaaggca 
tgtgctggct 
cagcttcttc 
cttcccctcc 
gctgctgcag 
ccggcagggc 
cgagggcctg 
cctgcaccag 
cgcccacgcc 
cagcgaggcc 
cacggtgctt 
gacgcacctg 
gggtctggag 
gaacgtgagc 
cgtggcccag 
ccccgtgaag 
gctgccgctg 
ggtgtggcag 
gacagagcgc 
ctcgcggcag 
cgactgtgtg 
cttttgtggc 
tcggttcctg 
gctgggcctt 
tcaggcctcg 
cagcgtcctc 
gtcccacctc 
cgtggagtca 
ctgggcctgg 
cctggtggcc 
ggtgcactgc 
gctggccttt 
ccgtgcccgt 
gcccctcctg 
gctctgtgtc 
gcagccaggg 
ccagaatgac 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2553 



<210> 4 

<211> 850 

<212> PRT 

<213> Homo sapiens 



<400> 4 

Met Leu Gly Pro Ala Val Leu Gly Leu Ser Leu Trp Ala Leu Leu His 
1 5 10 15 



o o 



Pro Gly Thr Gly Ala Pro Leu Cys Leu Ser Gln Gln Leu Arg Met Lys
20 25 30 

Gly Asp Tyr Val Leu Gly Gly Leu Phe Pro Leu Gly Glu Ala Glu Glu 
35 40 45 

Ala Gly Leu Arg Ser Arg Thr Arg Pro Ser Ser Pro Val Cys Thr Arg 
50 55 60 

Phe Ser Ser Asn Gly Leu Leu Trp Ala Leu Ala Met Lys Met Ala Val 
65 70 75 80 

Glu Glu Ile Asn Asn Lys Ser Asp Leu Leu Pro Gly Leu Arg Leu Gly
85 90 95 

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Ala Met Lys Pro 
100 105 110 

Ser Leu Met Phe Leu Ala Lys Ala Gly Ser Arg Asp Ile Ala Ala Tyr
115 120 125 

Cys Asn Tyr Thr Gln Tyr Gln Pro Arg Val Leu Ala Val Ile Gly Pro
130 135 140

His Ser Ser Glu Leu Ala Met Val Thr Gly Lys Phe Phe Ser Phe Phe 
145 150 155 160 

Leu Met Pro His Tyr Gly Ala Ser Met Glu Leu Leu Ser Ala Arg Glu 
165 170 175 

Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val Gln Leu
180 185 190 

Thr Ala Ala Ala Glu Leu Leu Gln Glu Phe Gly Trp Asn Trp Val Ala
195 200 205 

Ala Leu Gly Ser Asp Asp Glu Tyr Gly Arg Gln Gly Leu Ser Ile Phe
210 215 220 

Ser Ala Leu Ala Ala Ala Arg Gly Ile Cys Ile Ala His Glu Gly Leu
225 230 235 240 

Val Pro Leu Pro Arg Ala Asp Asp Ser Arg Leu Gly Lys Val Gln Asp
245 250 255 

Val Leu His Gln Val Asn Gln Ser Ser Val Gln Val Val Leu Leu Phe
260 265 270 

Ala Ser Val His Ala Ala His Ala Leu Phe Asn Tyr Ser Ile Ser Ser
275 280 285 

Arg Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ala Trp Leu Thr Ser 
290 295 300 



Asp Leu Val Met Gly Leu Pro Gly Met Ala Gln Met Gly Thr Val Leu
305 310 315 320 



o o 



Gly Phe Leu Gln Arg Gly Ala Gln Leu His Glu Phe Pro Gln Tyr Val
325 330 335 

Lys Thr His Leu Ala Leu Ala Thr Asp Pro Ala Phe Cys Ser Ala Leu 
340 345 350 

Gly Glu Arg Glu Gln Gly Leu Glu Glu Asp Val Val Gly Gln Arg Cys
355 360 365 

Pro Gln Cys Asp Cys Ile Thr Leu Gln Asn Val Ser Ala Gly Leu Asn
370 375 380 

His His Gln Thr Phe Ser Val Tyr Ala Ala Val Tyr Ser Val Ala Gln
385 390 395 400 

Ala Leu His Asn Thr Leu Gln Cys Asn Ala Ser Gly Cys Pro Ala Gln
405 410 415 

Asp Pro Val Lys Pro Trp Gln Leu Leu Glu Asn Met Tyr Asn Leu Thr
420 425 430 

Phe His Val Gly Gly Leu Pro Leu Arg Phe Asp Ser Ser Gly Asn Val 
435 440 445 

Asp Met Glu Tyr Asp Leu Lys Leu Trp Val Trp Gln Gly Ser Val Pro
450 455 460 

Arg Leu His Asp Val Gly Arg Phe Asn Gly Ser Leu Arg Thr Glu Arg 
465 470 475 480 

Leu Lys Ile Arg Trp His Thr Ser Asp Asn Gln Lys Pro Val Ser Arg
485 490 495 

Cys Ser Arg Gln Cys Gln Glu Gly Gln Val Arg Arg Val Lys Gly Phe
500 505 510 

His Ser Cys Cys Tyr Asp Cys Val Asp Cys Glu Ala Gly Ser Tyr Arg 
515 520 525 

Gln Asn Pro Asp Asp Ile Ala Cys Thr Phe Cys Gly Gln Asp Glu Trp
530 535 540 

Ser Pro Glu Arg Ser Thr Arg Cys Phe Arg Arg Arg Ser Arg Phe Leu 
545 550 555 560

Ala Trp Gly Glu Pro Ala Val Leu Leu Leu Leu Leu Leu Leu Ser Leu 
565 570 575 

Ala Leu Gly Leu Val Leu Ala Ala Leu Gly Leu Phe Val His His Arg 
580 585 590 

Asp Ser Pro Leu Val Gln Ala Ser Gly Gly Pro Leu Ala Cys Phe Gly
595 600 605 



Leu Val Cys Leu Gly Leu Val Cys Leu Ser Val Leu Leu Phe Pro Gly 
610 615 620 



o 



Gln Pro Ser Pro Ala Arg Cys Leu Ala Gln Gln Pro Leu Ser His Leu

625 630 635 640 

Pro Leu Thr Gly Cys Leu Ser Thr Leu Phe Leu Gln Ala Ala Glu Ile

645 650 655 

Phe Val Glu Ser Glu Leu Pro Leu Ser Trp Ala Asp Arg Leu Ser Gly 

660 665 670 

Cys Leu Arg Gly Pro Trp Ala Trp Leu Val Val Leu Leu Ala Met Leu 

675 680 685 

Val Glu Val Ala Leu Cys Thr Trp Tyr Leu Val Ala Phe Pro Pro Glu 

690 695 700 

Val Val Thr Asp Trp His Met Leu Pro Thr Glu Ala Leu Val His Cys 

705 710 715 720 

Arg Thr Arg Ser Trp Val Ser Phe Gly Leu Ala His Ala Thr Asn Ala 

725 730 735 

Thr Leu Ala Phe Leu Cys Phe Leu Gly Thr Phe Leu Val Arg Ser Gln

740 745 750

Pro Gly Cys Tyr Asn Arg Ala Arg Gly Leu Thr Phe Ala Met Leu Ala 

755 760 765 

Tyr Phe Ile Thr Trp Val Ser Phe Val Pro Leu Leu Ala Asn Val Gln

770 775 780 

Val Val Leu Arg Pro Ala Val Gln Met Gly Ala Leu Leu Leu Cys Val

785 790 795 800 

Leu Gly Ile Leu Ala Ala Phe His Leu Pro Arg Cys Tyr Leu Leu Met

805 810 815 



Arg Gln Pro Gly Leu Asn Thr Pro Glu Phe Phe Leu Gly Gly Gly Pro
820 825 830 

Gly Asp Ala Gln Gly Gln Asn Asp Gly Asn Thr Gly Asn Gln Gly Lys
835 840 845 

His Glu 
850 



<210> 5 
<211> 23 
<212> DNA 

<213> Artificial Sequence 
<220> 

<221> modified_base
<222> (3) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base



o 



<222> (9) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base
<222> (12) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base
<222> (18) 

<223> a, c, t, g, other or unknown 
<220> 

<223> Description of Artificial Sequence: Primer 
<400> 5 

cgnttyytng cntggggnga rcc 



<210> 6 
<211> 23 
<212> DNA 

<213> Artificial Sequence 
<220> 

<221> modified_base
<222> (3) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base
<222> (6) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base
<222> (18) 

<223> a, c, t, g, other or unknown 
<220> 

<221> modified_base
<222> (21) 

<223> a, c, t, g, other or unknown 
<220> 

<223> Description of Artificial Sequence: Primer 
<400> 6 

cgngcncgrt trtarcancc ngg 



<210> 7 

<211> 9 

<212> PRT 

<213> Homo sapiens 



0 



8 

<400> 7 

Arg Phe Leu Ala Trp Gly Glu Pro Ala 
1 5 



<210> 8 
<211> 8 
<212> PRT 

<213> Homo sapiens 
<400> 8 

Pro Gly Cys Tyr Asn Arg Ala Arg 
1 5 



<210> 9 
<211> 552 
<212> DNA 
<213> Mus sp. 



<400> 9 

gtgctgtcac 

ctctctgtcc 

tttggcctga 

agctctgcca 

agcacactct 

gcaaactggc 

tttgtggagg 

tggtcagtgc 

ggcttggtgc 
gtacaagacc 



tcctcctgct 
accactggga 
tctgcctagg 
gctgccttgc 
tcctgcaagc 
tatgcagcta 
cagcactatg 
tgcccacaga 
acatcaccaa 
ag 



gctttgcctg 
cagccctctt 
cctcttctgc 
acaacaacca 
agctgagacc 
ccttcgggac 
tgcctggtat 
ggtactggag 
tgcaatggta 



gtgctgggtc 
gtccaggcct 
ctcagtgtcc 
atggctcacc 
tttgtggagt 
tctggcctgc 
ttgaccgctt 
cactgccacg 
gcttttctct 



tagcactggc 
caggcggctc 
ttctgttccc 
tccctctcac 
ctgagctgcc 
tagtggtact 
caccagaagt 
tgcgttcctg 
gctttctggg 



tgctctgggg 60 
acagttctgc 120 
aggacggcca 180 
aggctgcctg 240 
actgagctgg 300
gttggccact 360 
ggtgacagac 420 
ggtcaacctg 480
cactttcctg 540 
552 



<210> 10 

<211> 184 

<212> PRT 

<213> Mus sp. 

<400> 10 
Val Leu Ser Leu 
1 

Ala Ala Leu Gly 
20 

Ala Ser Gly Gly 
35 

Phe Cys Leu Ser 
50 

Cys Leu Ala Gln
65 

Ser Thr Leu Phe 



Leu Leu Leu Leu 
5 

Leu Ser Val His 



Ser Gln Phe Cys
40 

Val Leu Leu Phe 
55 

Gln Pro Met Ala
70 

Leu Gln Ala Ala
85 



Cys Leu Val Leu 
10 

His Trp Asp Ser 
25 

Phe Gly Leu Ile



Pro Gly Arg Pro 
60 

His Leu Pro Leu 
75 

Glu Thr Phe Val 
90 



Gly Leu Ala Leu 
15 

Pro Leu Val Gln
30 

Cys Leu Gly Leu 
45 

Ser Ser Ala Ser 



Thr Gly Cys Leu 
80 

Glu Ser Glu Leu 
95 



o o 



Pro Leu Ser Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Asp Ser Gly 
100 105 110 

Leu Leu Val Val Leu Leu Ala Thr Phe Val Glu Ala Ala Leu Cys Ala 
115 120 125 

Trp Tyr Leu Thr Ala Ser Pro Glu Val Val Thr Asp Trp Ser Val Leu 
130 135 140 

Pro Thr Glu Val Leu Glu His Cys His Val Arg Ser Trp Val Asn Leu 
145 150 155 160 

Gly Leu Val His Ile Thr Asn Ala Met Val Ala Phe Leu Cys Phe Leu
165 170 175 

Gly Thr Phe Leu Val Gln Asp Gln
180 



<210> 11 
<211> 558 
<212> DNA 
<213> Rattus sp. 



<400> 11 

gtgctgtcac 

ctctttgtcc 

tttggcctga 

cgctctgcca 

agcacactct 

gcaaactggc 

actcttgtgg 

acagattggc 

agcctgggct 

ttcctggtac 



ttctcctgct 
actactggga 
tctgcctagg 
gctgccttgc 
tcctgcaagc 
tctgcagcta 
aggctgcact 
aggtgctgcc 
tggtgcacat 
aaagccag 



gctttgcctg 
cagccctctt 
cctcttctgc 
ccaacaacca 
agccgagatc 
ccttcggggc 
atgtgcctgg 
cacggaggta 
caccaatgca 



gtgctgggcc 
gttcaggcct 
ctcagtgtcc 
atggctcacc 
tttgtggagt 
ccctgggctt 
tacttgatgg 
ctggaacact 
ggggtagctt 



tgacactggc 
caggtgggtc 
ttctgttccc 
tccctctcac 
ctgagctgcc 
ggctggtggt 
ctttccctcc 
gccgcatgcg 
tcctctgctt 



tgccctgggg 
actgttctgc 
aggacgacca 
aggctgcctg 
actgagttgg 
actgctggcc 
agaggtggtg 
ttcctgggtc 
tctgggcact 



60 

120 

180 

240 

300 

360 

420 

480 

540 

558 



<210> 12 
<211> 186 
<212> PRT 
<213> Rattus sp. 

<400> 12 

Val Leu Ser Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Thr Leu 
1 5 10 15 

Ala Ala Leu Gly Leu Phe Val His Tyr Trp Asp Ser Pro Leu Val Gln
20 25 30 

Ala Ser Gly Gly Ser Leu Phe Cys Phe Gly Leu Ile Cys Leu Gly Leu
35 40 45 



Phe Cys Leu Ser Val Leu Leu Phe Pro Gly Arg Pro Arg Ser Ala Ser 
50 55 60 



Cys Leu Ala Gln Gln Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu
65 70 75 80 



oo 



no 



10 

Ser Thr Leu Phe Leu Gln Ala Ala Glu Ile Phe Val Glu Ser Glu Leu
85 90 95 

Pro Leu Ser Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Gly Pro Trp 
100 105 110 

Ala Trp Leu Val Val Leu Leu Ala Thr Leu Val Glu Ala Ala Leu Cys 
115 120 125

Ala Trp Tyr Leu Met Ala Phe Pro Pro Glu Val Val Thr Asp Trp Gln
130 135 140 

Val Leu Pro Thr Glu Val Leu Glu His Cys Arg Met Arg Ser Trp Val 
145 150 155 160 

Ser Leu Gly Leu Val His Ile Thr Asn Ala Gly Val Ala Phe Leu Cys
165 170 175 

Phe Leu Gly Thr Phe Leu Val Gln Ser Gln
180 185 



<210> 13 
<211> 2577 
<212> DNA 
<213> Rattus sp. 



<400> 13 

atgccgggtt 

tcctctttgt 

tttcccctgg 

ctatgtacca 

gaggagatca 

gacacatgct 

ggaagtcaaa 

gtcattggtc 

ctcatgccac 

ccatccttct 

ttgcagaatt 

gaaggtctga 

ggcctggtgc 

cgccaagtga 

tactcccttt 

gagtcctggc 

gttcttgggt 

cgccttgccc 

gaggagcgcg 

tcatctgggc 

tatgcagctg 

cattgccaca 

agtttccgtg 

tatgacctga 

ttcaacggca 

gtctcccagt 

tcctgctgct 

ttcacctgta 

cctcgcaggc 

ctttgcctgg 



tggctatctt 
gtctgtcaca 
gcacaactga 
ggttctcgcc 
acaatggatc 
cagagccagt 
gcattgctgc 
cccactcatc 
aggtcagcta 
tccgcacagt 
tcagctggaa 
gcatcttttc 
cacaacatga 
accaaagcaa 
ttagctacag 
tgacctctga 
ttctgcagcg 
tagctgctga 
tgatggggcc 
tgatgcagaa 
tgtacagtgt 
catcagagcc 
ctcgagactt 
agatgtgggt 
cccttcagct 
gctcccggca 
atgactgtgt 
ctccatgtgg 
ccaagtttct 
tgctgggcct 



gggcctcagt 
gcaattcaag 
ggaggccact 
ccttggtttg 
tgccttgctc 
ggtcaccatg 
ctactgcaac 
agagcttgcc 
tagtgccagc 
gcccagtgac 
ctgggtggct 
tggtctggcc 
cactagtggc 
agtacaggtg 
catccttcat 
cctggtcatg 
cggtgcccta 
cccaacattc 
acgctgttca 
cctatcagct 
ggctcaggcc 
tgttcaaccc 
gacactgcag 
gtggcagagc 
gcagcactcg 
gtgcaaagat 
ggactgcaag 
caaggatcag 
ggcttggggg 
gacactggct 



ctggctgctt 
gcacaagggg 
ctcaaccaga 
ttcctggcca 
cctgggctgc 
aagcccagcc 
tacacacagt 
ctcattacag 
atggatcggc 
cgggtgcagc 
gccttaggta 
aactcacgag 
caacaattgg 
gtggtgctgt 
gacctctcac 
acacttccca 
ctgcctgaat 
tgtgcctccc 
caatgtgact 
gggcagttgc 
cttcacaaca 
tggcagctcc 
tttgatgcca 
cctacacctg 
aaaatgtatt 
ggccaggtgc 
gcagggagct 
tggtccccag 
gagccagctg 
gccctggggc 



tcctggagct 
actatatatt 
gaacacagcc 
tggctatgaa 
gactgggcta 
tcatgttcat 
accaaccccg 
gcaagttctt 
taagtgaccg 
tgcaggccgt 
gtgatgatga 
gtatctgcat 
gcaaggtggt 
ttgcatctgc 
ccaaggtatg 
atattgcccg 
tttcccatta 
tgaaagctga 
acatcatgct 
accaccaaat 
ccctgcagtg 
tggagaacat 
aagggagtgt 
tactacatac 
ggccaggcaa 
gcagagtaaa 
accggaagca 
aaaaaagcac 
tgctgtcact 
tctttgtcca 



tgggatgggg 
gggtggacta 
caacggcatc 
gatggctgta 
tgacctgttt 
ggccaaggtg 
tgtgctggct 
cagcttcttc 
ggaaacattt 
tgtgacactg 
ctatggccgg 
tgcacacgag 
ggatgtgcta 
ccgtgctgtc 
ggtggccagt 
tgtgggcact 
tgtggagact 
gttggatctg 
acagaacctg 
atttgcaacc 
caatgtctca 
gtacaatatg 
agacatggaa 
tgtaggcacc 
ccaggtgcca 
gggctttcat 
tccagatgac 
aacctgctta 
tctcctgctg 
ctactgggac 



60 

120 

180 

240 

300

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 



on 



no 



11 



agccctcttg 
ctcttctgcc 
caacaaccaa 
gccgagatct 
cttcggggcc 
tgtgcctggt 
acggaggtac 
accaatgcag 
ggtcgctata 
gtctcttttg 
ggtgctatct 
gtacttctgt 
gaagcatcag 



ttcaggcctc 
tcagtgtcct 
tggctcacct 
ttgtggagtc 
cctgggcttg 
acttgatggc 
tggaacactg 
tgttagcttt 
accgtgcccg 
tgcccctcct 
tattctgtgc 
ggctgccaga 
atgggaatag 



aggtgggtca 
tctgttccca 
ccctctcaca 
tgagctgcca 
gctggtggta 
tttccctcca 
ccgcatgcgt 
cctctgcttt 
tggcctcacc 
ggctaatgtg 
cctgggcatc 
gctcaacacc 
tggtagtagt 



ctgttctgct 
ggacgaccac 
ggctgcctga 

ctgagttggg
ctgctggcca 
gaggtggtga 
tcctgggtca 
ctgggcactt 
ttcgccatgc 
caggtggcct 
ctggccacct 
caggagttct 
gaggcaactc 



ttggcctgat 
gctctgccag 
gcacactctt 
caaactggct 
ctcttgtgga 
cagattggca 
gcctgggctt 
tcctggtaca 
tagcttattt 
accagccagc 
tccacctgcc 
tcctgggaag 
ggggacacag 



ctgcctaggc 
ctgccttgcc 
cctgcaagca 
ctgcagctac 
ggctgcacta 
ggtgctgccc 
ggtgcacatc 
gagccagcct 
catcatctgg 
tgtgcagatg 
caaatgctat 
gagccccaag 
tgaatga 



1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2577 



<210> 14 

<211> 858 

<212> PRT 

<213> Rattus sp. 

<400> 14 

Met Pro Gly Leu Ala Ile Leu Gly Leu Ser Leu Ala Ala Phe Leu Glu
1 5 10 15

Leu Gly Met Gly Ser Ser Leu Cys Leu Ser Gln Gln Phe Lys Ala Gln
20 25 30 

Gly Asp Tyr Ile Leu Gly Gly Leu Phe Pro Leu Gly Thr Thr Glu Glu
35 40 45 

Ala Thr Leu Asn Gln Arg Thr Gln Pro Asn Gly Ile Leu Cys Thr Arg
50 55 60 

Phe Ser Pro Leu Gly Leu Phe Leu Ala Met Ala Met Lys Met Ala Val 
65 70 75 80 

Glu Glu Ile Asn Asn Gly Ser Ala Leu Leu Pro Gly Leu Arg Leu Gly
85 90 95 

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Thr Met Lys Pro 
100 105 110 

Ser Leu Met Phe Met Ala Lys Val Gly Ser Gln Ser Ile Ala Ala Tyr
115 120 125 

Cys Asn Tyr Thr Gln Tyr Gln Pro Arg Val Leu Ala Val Ile Gly Pro
130 135 140 

His Ser Ser Glu Leu Ala Leu Ile Thr Gly Lys Phe Phe Ser Phe Phe
145 150 155 160 



Leu Met Pro Gln Val Ser Tyr Ser Ala Ser Met Asp Arg Leu Ser Asp
165 170 175 



Arg Glu Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val 
180 185 190 



oo 



oo 



12 



Gln Leu Gln Ala Val Val Thr Leu Leu Gln Asn Phe Ser Trp Asn Trp
195 200 205 

Val Ala Ala Leu Gly Ser Asp Asp Asp Tyr Gly Arg Glu Gly Leu Ser 
210 215 220 

Ile Phe Ser Gly Leu Ala Asn Ser Arg Gly Ile Cys Ile Ala His Glu
225 230 235 240 

Gly Leu Val Pro Gln His Asp Thr Ser Gly Gln Gln Leu Gly Lys Val
245 250 255 

Val Asp Val Leu Arg Gln Val Asn Gln Ser Lys Val Gln Val Val Val
260 265 270 

Leu Phe Ala Ser Ala Arg Ala Val Tyr Ser Leu Phe Ser Tyr Ser Ile
275 280 285 

Leu His Asp Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ser Trp Leu 
290 295 300 

Thr Ser Asp Leu Val Met Thr Leu Pro Asn Ile Ala Arg Val Gly Thr
305 310 315 320 

Val Leu Gly Phe Leu Gln Arg Gly Ala Leu Leu Pro Glu Phe Ser His
325 330 335 

Tyr Val Glu Thr Arg Leu Ala Leu Ala Ala Asp Pro Thr Phe Cys Ala 
340 345 350 

Ser Leu Lys Ala Glu Leu Asp Leu Glu Glu Arg Val Met Gly Pro Arg 
355 360 365 

Cys Ser Gln Cys Asp Tyr Ile Met Leu Gln Asn Leu Ser Ser Gly Leu
370 375 380 

Met Gln Asn Leu Ser Ala Gly Gln Leu His His Gln Ile Phe Ala Thr
385 390 395 400 

Tyr Ala Ala Val Tyr Ser Val Ala Gln Ala Leu His Asn Thr Leu Gln
405 410 415 

Cys Asn Val Ser His Cys His Thr Ser Glu Pro Val Gln Pro Trp Gln
420 425 430 

Leu Leu Glu Asn Met Tyr Asn Met Ser Phe Arg Ala Arg Asp Leu Thr 
435 440 445 

Leu Gln Phe Asp Ala Lys Gly Ser Val Asp Met Glu Tyr Asp Leu Lys
450 455 460 

Met Trp Val Trp Gln Ser Pro Thr Pro Val Leu His Thr Val Gly Thr
465 470 475 480 

Phe Asn Gly Thr Leu Gln Leu Gln His Ser Lys Met Tyr Trp Pro Gly



485 



490 



495 



oo oo 



13 

Asn Gln Val Pro Val Ser Gln Cys Ser Arg Gln Cys Lys Asp Gly Gln
500 505 510 

Val Arg Arg Val Lys Gly Phe His Ser Cys Cys Tyr Asp Cys Val Asp 
515 520 525

Cys Lys Ala Gly Ser Tyr Arg Lys His Pro Asp Asp Phe Thr Cys Thr 
530 535 540 

Pro Cys Gly Lys Asp Gln Trp Ser Pro Glu Lys Ser Thr Thr Cys Leu
545 550 555 560 

Pro Arg Arg Pro Lys Phe Leu Ala Trp Gly Glu Pro Ala Val Leu Ser 
565 570 575 

Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Thr Leu Ala Ala Leu 
580 585 590 

Gly Leu Phe Val His Tyr Trp Asp Ser Pro Leu Val Gln Ala Ser Gly
595 600 605 

Gly Ser Leu Phe Cys Phe Gly Leu Ile Cys Leu Gly Leu Phe Cys Leu
610 615 620 

Ser Val Leu Leu Phe Pro Gly Arg Pro Arg Ser Ala Ser Cys Leu Ala 
625 630 635 640 

Gln Gln Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu Ser Thr Leu
645 650 655 

Phe Leu Gln Ala Ala Glu Ile Phe Val Glu Ser Glu Leu Pro Leu Ser
660 665 670 

Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Gly Pro Trp Ala Trp Leu 
675 680 685 

Val Val Leu Leu Ala Thr Leu Val Glu Ala Ala Leu Cys Ala Trp Tyr 
690 695 700 

Leu Met Ala Phe Pro Pro Glu Val Val Thr Asp Trp Gln Val Leu Pro
705 710 715 720 

Thr Glu Val Leu Glu His Cys Arg Met Arg Ser Trp Val Ser Leu Gly 
725 730 735 

Leu Val His Ile Thr Asn Ala Val Leu Ala Phe Leu Cys Phe Leu Gly
740 745 750 

Thr Phe Leu Val Gln Ser Gln Pro Gly Arg Tyr Asn Arg Ala Arg Gly
755 760 765

Leu Thr Phe Ala Met Leu Ala Tyr Phe Ile Ile Trp Val Ser Phe Val
770 775 780 



Pro Leu Leu Ala Asn Val Gln Val Ala Tyr Gln Pro Ala Val Gln Met
785 790 795 800 



oo oo 



14 

Gly Ala Ile Leu Phe Cys Ala Leu Gly Ile Leu Ala Thr Phe His Leu
805 810 815 

Pro Lys Cys Tyr Val Leu Leu Trp Leu Pro Glu Leu Asn Thr Gln Glu

820 825 830 

Phe Phe Leu Gly Arg Ser Pro Lys Glu Ala Ser Asp Gly Asn Ser Gly 
835 840 845 

Ser Ser Glu Ala Thr Arg Gly His Ser Glu 
850 855 



<210> 15 
<211> 8194 
<212> DNA 

<213> Homo sapiens 
<220> 

<221> modified_base
<222> (1251) . . (1300) 

<223> a, c, t, g, other or unknown 
<220>

<221> modified_base

<222> (1951) . . (2000) 

<223> a, c, t, g, other or unknown 



<400> 15 

gagaatctcg 

gcctccgagc 

ccgatctggt 

agccggccgg 

aaacaccggg 

aacatgtcta 

gtaacaaggc 

tggggcaggg 

aaagttctga 

aaatgccaga 

ccgtccagag 

agttcctgag 

gggctccagt 

tatttaagca 

gccagcatgc 

tgggcctttg 

ctcctggcag 

gtgaccctgt 

ctatagggcc 

gaactgtccc 

ctagacactt 

nnnnnnnnnn 

tcactttctc 

cttcaggacc 

gagcttgaga 

tccctttgct 

ttctcagctg 

ccacctcttc 

gcccaacatc 



cgagatcccg 
cgccggcgcc 
cgaggggctc 
agagagaaag 
atattttttt 
tttgcatacc 
gaaagtatat 
gggtgtcgac 
aacctcgcaa 
gctccttttc 
gaagggtcac 
tgggaccgca 
cccacccctt 
actggcctcc 
tgctctgcac 
cctgccatag 
gcctgttccc 
gtgacaggtg 
cctctggctg 
caggccttgt 
cggccagttt 
nnnnnnnnnn 
tctctctctg 
ttttcgatgc 
gcccttgttg 
cccaagcctc 
tctcttactg 
caggctatgc 
accctggggt 



tcggtccgcc 
ctctgccggc 
cacggaggac 
ccagaaacct 
tctcctgcag 
ttcggtttgc 
gacaatttgc 
tcaaagctgt 
cacccggaga 
taagccaggt 
tgggtgccac 
ggcccggaat 
ttgggggcct 
ttagaggcca 
ggctcgcctg 
cacggagtct 
tctccattct 
agtgaggggc 
ccatcctcca 
tcatcaatcc 
ccaattattt 
nnnnnnnnnn 
gaaaacactg 
taataagttt 
aagttgtggt 
agagtctagg 
gctttctcca 
ggcttggggt 
accagctgta 



ccgctgccct 
aacctccgga 
tccatttacg 
cgcgaccagc 
aaaaagcttt 
atgcatttgt 
tcagaatctt 
gtctcattta 
aattgtgttc 
gaagtcacag 
ctggtttgca 
gtcaaggcaa 
gaagttagga 
ctccttggcc 
gtcggcctgc 
tctcctgact 
ggctgtctgc 
cagcagagcc 
aacaggacct 
acttgccacc 
cacccttgct 
nnnnnnnnnn 
actaatgtag 
ctccatcagg 
ttgggggact 
aggccagagg 
caggtcttgt 
tgaggagata 
tgatgtgtgt 



cccagctgcc 
agcacactag 
ttacgcaaat 
catgggccac 
aggattggca 
ttcgaagtga 
aatgtcagaa 
gtaaactgag 
cagcctccca 
agcgtggaca 
tctgtgcctt 
acagtcctgc 
agcatccggc 
atgccaggcg 
agcttctcat 
tcaccctccc 
aggtgaggca 
acacttagtg 
tgcctctgcc 
taagtgctgg 
gttagaatgt 
aattccttaa 
caggtttctc 
gccagcttgt 
ggaccgatga 
gtctcagcag 
agcttcaatg 
aacaactcca 
tctgactctg 



gaaaagaggg 
gaggttccag 
tccctacccc 
ctctccggaa 
gtttaaacaa 
gcaaccctgg 
aactggagac 
gcccaggtaa 
cctcgcccca 
gaacccacaa 
cgtcctgccc 
ttcagccact 
agctgccttc 
cgggcatctg 
ttcctgctgc 
cggagattac 
cagacccgag 
ggacccctgg 
tttgcccctt 
ctagaccttc 
nnnnnnnnnn 
actaaatttc 
tgctccagga 
tcctcctact 
cctcaaaggt 
gcctttgtcc 
agcatggcta 
cggccctgct 
ccaatgtgta 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 



oo 



oo 



15 



tgccacgctg 

tctccactat 

caccacagcc 

tttgcccatc 

nnnnnnnnnn 

acggggtttc 

ctcggcctcc 

taatataata 

tgttttccta 

gacattagat 

gggttcaagc 

taaatacaga 

tcctaacagg 

caaactgcct

atgcaggttt 

tcccacccct 

caggctgagg 

gccaggcact 

ttagctatgc 

gcaccatccc 

ggtggacctg 

cactggagaa 

tctctgccca 

gggccaccgt 

tggtgctgac 

ggcacatcac 

agaagagggc 

aggcccctag 

gccaagcttt 

acaacgcata 

cctctggagc 

cacctcctgt 

ctctaaatgc 

gttttttgag 

ctctgcaact 

gggattacag 

agatagagtc 

gagctccgcc 

acgggcgccc 

caccatgtta 

ccaaagtgct 

tagagatggg 

ctcctgcttc 

gatctttctc 

aagatccagg 

ttggtgggga 

gaaaccacca 

tctgtgctgt 

caaggtgcat 

cagtagctat 

cggttcctcc 

cggaaaggac 

acctagagcc 

gtccagctgc 

gagtgtgcag 

gccctgaggg 

cttgggcccc 

gcgactgtct 



agagtgctct 
tcccctacgg 
gccctgctga 
tcccttcagg 
nnnnnnnnnn 
accgtgttag 
caatgtgctg 
aaataattat 
caactagatg 
tctcataagt 
tcctacaaga 
tgaagcttcg 
ccactgacct 
ccagtggaag 
tgtctccttt 
cccccagaac 

ggtgctctcc 

gggggggcct

ggccagcagc 
caatgacaag 
gatctctctg 
ccaggccact 
ggtgggcgat 
cgtggttgtt 
caacctgact 
tggggtgccc 
tgtccctggc 
gccttgccac 
catggcacac 

ccgggctgtg 

ttgttccagg 
cagggagaac 
caagggggat 
acagtctggc 
tccacctcct 
gcacccacca 
tcgctctgtt 
tcccaggttc 
gccaccacgc 
gccaggatgg 
gggattacag 
gtttcaccat 
ggcctcccaa 
tctgatcctt 
gctaaaactg 
agattgaggg 
ggacggaaac 
ctgtggtggc 
ttccttctac 
aacataattg 
acatggtctc 
aaccaggtaa 
tgggggtgat 
caccactcta 
atgccctggg 
cagatgcaca 
tacgtgtggc 
tgaagggcac 



ccctgccagg 
tgctggcagt 
gccctttcct 
caagtctggg 
gccaccatgc 
ccaggctggt 
ggattacagg 
acaactcacc 
gtcccatctg 
agcgtgcaac 
atctgatgct 
cttactcacc 
aacttctgcc 
tccctgaagg 
gcttggaatg 
ctgccccagt 
tggtctcccc 
tcagtggaga 
gagacgctca 
taccaggtgg 
gttggcagca 
ggtcagggga 
gagaggatgc 
ttttccagcc 
ggcaaggtgt 
gggatccagc 
ctgaaggcgt 
aagggctcct 
acgatgccca 
tatgcggtgg 
ggccgagtct 
agccaatcct 
aaatgccact 
tctgtcaccc 
gggttcaagt 
ccatgcctgg 
gcccaggctg 
actccattcc 
ccagctaatt 
tctcaatctc 
gcgtgagcca 
gttggccagg 
agtgctggga 
gccttctctc 
tctgtaaagg 
gcttcctaag 
ccaggaaggc 
ttcatgatac 
acaaggacac 
cctgggactg 
cagttcagct 
tggggatgtg 
gctgacacag 
cccatcctgg 
gcggaagttc 
gagattctgt 
ccctctggct 
cagcgagtgg 



gcaacaccac 
gattgggcct 
ggtgcccatg 
nnnnnnnnnn 
ccggctaatt 
cgcaaactcc 
tgtgagccac 
ataatgtaga 
ggggtgatgg 
ccagatccct 
gctgctgatc 
agctgctcac 
ctgacctaca 
tccccaaaca 
catcccctca 
ggagccttcg 
ggctccctgt 
ctgaaatggc 
gcgtgaagcg 
agaccatggt 
gtgacgacta 
tctgcattgc 
agtgcctcat 
ggcagttggc 
gggtcgcctc 
gcattgggat 
ttgaagaagc 
ggtgcagcag 
agctcaaagc 
cccatggcct 
acccctggca 
gagatgagca 
aacttgaggt 
aggctgcagt 
gattctcttg 
ataatttttc 
gaatgcagtg 
cctgcctcag 
ttttttgtat 
ctgaccttgt 
ccgcacccgg 
ctggtctcga 
ttacaggcat 
acccactgtg 
agtgtttgtt 
aaggaaggga 
cccaggccct 
gcgtttcttt 
tgtggcgttt 
gaatggaccc 
aaacataaat 
gctactcacc 
tgtacaggga 
ccagggaagc 
acacgaccag 
tttctgttcc 
tcttacaggt 
ttacgggttt 



atagagctcc 
gacagcacca 
gtaagctgga 
nnnnnnnnnn 
tttttgtatt 
taacctcgtg 
tgcacccggc 
atcagtggga 
gagacagtga 
cgcatgtgca 
tgacaggagg 
ctcctcctgt 
catgcttctc 
cacgggacta 
ccccttgtcc 
caggtgattt 
atccccacac 
tgaacgggac 
gcagtatccc 
gctgctgctg 
tgggcagcta 
tttcaaggac 
gcgccacctg 
cagggtgttt 
agaagcctgg 
ggtgctgggc 
ctatgcccgg 
caatcagctc 
cttctccatg 
ccaccagctc 
ggtaagagag 
gagtgggcac 
tttttgtttt 
gtagtgatgc 
cctcggcctc 
ttttcttttt 
gtgcgatctt 
cctcccaagt 
tttgagtaga 
catccgccca 
cctaattttt 
actcctggca 
tagctctctt 
tcttggaagt 
agaggcctcc 
cgagaccttc 
tgcttctggg 
cagcttttgg 
aatgacaaca 
aagtggacct 
gagaccaaaa 
atgtaactgg 
gcaggagggg 
agggaagaca 
gggccctgcc 
acatgtgagc 
gcctaagtct 
ccatcactgc 



aaggagacct 
accgtgctgc 
gcctcagacc 
nnnnnnnnnn 
tttagtagag 
atccacccac 
cataatgtat 
gccctgagct 
cagatcatca 
gttcacagta 
ggagcagctg 
gaggcccggt 
ttcttccttg 
tttcactcct 
ccaggcagat 
gtcagtttca 
ccagcacagg 
ctcccataga 
tctttcctgc 
cagaagttcg 

ggggtgcagg 

atcatgccct 
gcccaggccg 
ttcgagtccg 
gccctctcca 
gtggccatcc 
gcagacaaga 
tgcagagaat 
agttctgcct 
ctgggctgtg 
cccaccccag 
tctccggtca 
gttttgtttt 
gatctcggct 
ctgagtagct 
tttttttttg 
ggctcactgt 
aggtgggact 
gacggggttt 
cctcgtcctc 
gtatttttag 
tcaagtgatc 
ctcttagaca 
gtcaagtgat 
tctcaggagg 
ctgatgggct 
accatgtggg 
agcagatcca 
gagatcccct 
tcacggtcct 
tccagtggca 
cttatgggca 
ggccccaggg 
ctccgtaggc 
ctgggagtga 
tgtcctttga 
gtgtgttcca 
tgctttgagt 



1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 



oo 



gtgtgccctg tggggctggg accttcctca 
cgagctaccc agcactcccg ggggctgcac 
gtgccctgcc ccagaaccaa ggcccagtca 
acacctgcta ccagacagaa ttctgatcaa 
gcctgtaatc ccagcacttt gggaggctga 
gagaccagcc tggccaacat ggtgaaaccc 
gggtgtggtg gcgcgtgcct gtaatcccag 
ttgaacccag gaggcggagg ttgcagtgag 
cgagaattcg tccccccaaa aaaagaaagg 
cccagcactt tgggaggccg aggtgggtgg 
ctgaccaaca tggtgaaacc ccatctctac 
gtggcgtgtg cctgtaattc cagctactcg 
cgggaggcgg aggttgcagt gagccaagat 
gagaaaaact ctgtctcaaa aaaaaagaaa 
agactgaggt gtgtcctctg ttagagagct 
tcctgaattc aacctctttc tctaaatgaa 
tcctactgtc ccttctgttg cccatgccaa 
gaatacagat actagcgtgt ctgcagcaga 
caaggtcaag aacagagagc aaattaggta 
aggggccaca ttctttcctt tcaccatctc 
tcagagggtc aggactcaga gaaaccacag 
atgctggcaa gagagagggg ttacaatgcc 
tcgtaacctc tctggtatgt gggcagagct 
aaaccctcat gggatcatga gccatacaga 
taacacaggc attttgagga aatgcgtggc 
cactatgcct agtatagtct agctgccctg 
tatttcctat tcctactctg ctcatctggc 
gacctctaca gatgccagcc ttgtgggaaa 
tgcttcccgc gcactgtggt gtttttggct 
gcagctaaca cgctgctgct gctgctgctg 
ctagacaccc ctgtggtgag gtcagcaggg 
ctggcagcag gtagtggcag cctctatggc 
ttgctacgcc aggccctctt tgcccttggt 
cgctcattcc aactaatcat catcttcaag 
gcctgggtcc aaaaccacgg tgctggcctg 
cttatctgtc taacttggct ggtggtgtgg 
ttcccccatc tggtgatgct tgagtgcaca 
ttcctctaca atggcctcct ctccatcagt 
ttgccagaga actacaacga ggccaaatgt 
tcctggatcg ccttcttcac cacggccagc 
aacatgatgg ctgggctgag cagcctgagc 
tgctacgtga tcctctgccg cccagacctc 
caggactaca cgaggcgctg cggctccacc 
gccttctctg ccctgagggt cgaaggtcga 
gcatcgcggt ctggggttgg gacgtgtaag 
ctgccaataa agaagtgaaa tgcgtatctg 
acggattcaa gtctgaaccc agagcctgga 
ggcaactccg gaggcgggcc cagcgccaaa 
cattggccgt tctctgcggg gccccgccct 
cgaggcgcac ctcctggcct gcacgctttg 



<210> 16 

<211> 2526 

<212> DNA 

<213> Homo sapiens 



no 



16 

acaagagtgg tgagtgggca atggagcagg 5280 
ggtggaggga gggcctccct tgggccccat 5340 
ctgggctgcc agttagcttc aggttggagg 5400 
gagaatcagc cactgggtgc ggtggctcat 5460 
ggcgggtgga tcacttgagg tcgggagttc 5520 
catctctacc aaaaatataa aaaattagct 5580 
ctactcggga ggctgaggca ggagaatcac 5640 
ccaagatgca ttccagcctg gaccacaaag 5700 
aggccgggcg cggtggctca cacctgtaat 5760 
atcacctgag gtcaggagtt cgagaccagc 5820 
taaaaataca aaaaaagtta gccgggcgtt 5880 
ggaggctgag gcaggagaat tgcttgaacc 5940 
tgcaccattg cactccagcc tgggcgacaa 6000 
gaaagaaaga attagccaac tgaaagcctt 6060 
gtcatcacaa ctcctacaaa agcagtcgta 6120 
tatagctatt gttccctttg tgccctcttg 6180 
agacagctag ctccttgaac agcttggcct 6240 
gaaaaaaaca gcattcccca tccagaaatg 6300 
gctaaggact caggtcctta gttggtgtcc 6360 
tgtagggaca ggaatacttc ccttctgtcc 6420 
agcagcagct caggaaagtg gttcatggaa 6480 
ctcccttggg agcaggctgc tcccatcaga 6540 
accaggttaa ggtcctccct agggtttgca 6600 
accgacctgt gtgtctccag agtctgtaat 6660 
ctcaggcccc actcccggct acccccatcc 6720 
gtacaattct cccagtatct tgcaggcccc 6780 
tctcaggaac cttcttggcc ttccctttca 6840 
gaagagtggg cacctgaggg aagccagacc 6900 
ttgcgtgagc acacctcttg ggtgctgctg 6960 
cttgggactg ctggcctgtt tgcctggcac 7020 
ggccgcctgt gctttcttat gctgggctcc 7080 
ttctttgggg aacccacaag gcctgcgtgc 7140 
ttcaccatct tcctgtcctg cctgacagtt 7200 
ttttccacca aggtacctac attctaccac 7260 
tttgtgatga tcagctcagc ggcccagctg 7320 
accccactgc ctgctaggga ataccagcgc 7380 
gagaccaact ccctgggctt catactggcc 7440 
gcctttgcct gcagctacct gggtaaggac 7500 
gtcaccttca gcctgctctt caacttcgtg 7560 
gtctacgacg gcaagtacct gcctgcggcc 7620 
agcggcttcg gtgggtattt tctgcctaag 7680 
aacagcacag agcacttcca ggcctccatt 7740 
tgaccagtgg gtcagcaggc acggctggca 7800 
gcaggccggg ggtgtccggg aggtctttgg 7860 
cgcctgggag agcctagacc aggctccggg 7920 
gtctcctgtc gtgggagagt gtgaggtgta 7980 
aaaggctgac cgcccagatt gacgttgcta 8040 
agaacagggc gaggcgtcgt ccccgcatcc 8100 
cgggggccgg agctagaagc tctacgcttc 8160 
acgt 8194 



GO 



OG 



17 



<400> 16 

atgctgctct 

tttgcctgcc 

gcaggcctgt 

ctgtgtgaca 

cttggggttg 

cagctgtatg 

ctgccagggc 

ctggcagtga 

cctttcctgg 

cagtatccct 

ctgctgctgc 

gggcagctag 

ttcaaggaca 

cgccacctgg 

agggtgtttt 

gaagcctggg 

gtgctgggcg 

tatgcccggg 

aatcagctct 

ttctccatga 

caccagctcc 

cttttggagc 

gacaacagag 

tggaccttca 

accaaaatcc 

tgtcttgaag 

ccctgtgggg 

aaagaagagt 

gctttgcgtg 

ctgcttggga 

gggggccgcc 

ggcttctttg 

ggtttcacca 

aagttttcca 

ctgtttgtga 

tggaccccac 

acagagacca 

agtgcctttg 

tgtgtcacct 

agcgtctacg 

agcagcggct 

ctcaacagca 

acctga 



gcacggctcg 
atagcacgga 
tccctctcca 
ggtcttgtag 
aggagataaa 
atgtgtgttc 
aacaccacat 
ttgggcctga 
tgcccatgat 
ctttcctgcg 
agaagttcgg 
gggtgcaggc 
tcatgccctt 
cccaggccgg 
tcgagtccgt 
ccctctccag 
tggccatcca 
cagacaagaa 
gcagagaatg 
gttctgccta 
tgggctgtgc 
agatccacaa 
atcccctcag 
cggtcctcgg 
agtggcacgg 
ggcaccagcg 
ctgggacctt 
gggcacctga 
agcacacctc 
ctgctggcct 
tgtgctttct 
gggaacccac 
tcttcctgtc 
ccaaggtacc 
tgatcagctc 
tgcctgctag 
actccctggg 
cctgcagcta 
tcagcctgct 
acggcaagta 
tcggtgggta 
cagagcactt 



cctggtcggc 
gtcttctcct 
ttctggctgt 
cttcaatgag 
caactccacg 
tgactctgcc 
agagctccaa 
cagcaccaac 
tagctatgcg 
caccatcccc 
gtggacctgg 
actggagaac 
ctctgcccag 
ggccaccgtc 
ggtgctgacc 
gcacatcact 
gaagagggct 
ggcccctagg 
ccaagctttc 
caacgcatac 
ctctggagct 
ggtgcatttc 
tagctataac 
ttcctccaca 
aaaggacaac 
agtggttacg 
cctcaacaag 
gggaagccag 
ttgggtgctg 
gtttgcctgg 
tatgctgggc 
aaggcctgcg 
ctgcctgaca 
tacattctac 
agcggcccag 
ggaataccag 
cttcatactg 
cctgggtaag 
cttcaacttc 
cctgcctgcg 
ttttctgcct 
ccaggcctcc 



ctgcagcttc 
gacttcaccc 
ctgcaggtga 
catggctacc 
gccctgctgc 
aatgtgtatg 
ggagaccttc 
cgtgctgcca 
gccagcagcg 
aatgacaagt 
atctctctgg 
caggccactg 
gtgggcgatg 
gtggttgttt 
aacctgactg 
ggggtgcccg 
gtccctggcc 
ccttgccaca 
atggcacaca 
cgggctgtgt 
tgttccaggg 
cttctacaca 
ataattgcct 
tggtctccag 
caggtgccta 
ggtttccatc 
agtgacctct 
acctgcttcc 
ctggcagcta 
cacctagaca 
tccctggcag 
tgcttgctac 
gttcgctcat 
cacgcctggg 
ctgcttatct 
cgcttccccc 
gccttcctct 
gacttgccag 
gtgtcctgga 
gccaacatga 
aagtgctacg 
attcaggact 



tcatttcctg 
tccccggaga 
ggcacagacc 
acctcttcca 
ccaacatcac 
ccacgctgag 
tccactattc 
ccacagccgc 
agacgctcag 
accaggtgga 
ttggcagcag 
gtcaggggat 
agaggatgca 
tttccagccg 
gcaaggtgtg 
ggatccagcg 
tgaaggcgtt 
agggctcctg 
cgatgcccaa 
atgcggtggc 
gccgagtcta 
aggacactgt 
gggactggaa 
ttcagctaaa 
agtctgtgtg 
actgctgctt 
acagatgcca 
cgcgcactgt 
acacgctgct 
cccctgtggt 
caggtagtgg 
gccaggccct 
tccaactaat 
tccaaaacca 
gtctaacttg 
atctggtgat 
acaatggcct 
agaactacaa 
tcgccttctt 
tggctgggct 
tgatcctctg 
acacgaggcg 



ctgctgggcc 
ttacctcctg 
cgaggtgacc 
ggctatgcgg 
cctggggtac 
agtgctctcc 
ccctacggtg 
cctgctgagc 
cgtgaagcgg 
gaccatggtg 
tgacgactat 
ctgcattgct 
gtgcctcatg 
gcagttggcc 
ggtcgcctca 
cattgggatg 
tgaagaagcc 
gtgcagcagc 
gctcaaagcc 
ccatggcctc 
cccctggcag 
ggcgtttaat 
tggacccaag 
cataaatgag 
ttccagcgac 
tgagtgtgtg 
gccttgtggg 
ggtgtttttg 
gctgctgctg 
gaggtcagca 
cagcctctat 
ctttgccctt 
catcatcttc 
cggtgctggc 
gctggtggtg 
gcttgagtgc 
cctctccatc 
cgaggccaaa 
caccacggcc 
gagcagcctg 
ccgcccagac 
ctgcggctcc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2526 



<210> 17 
<211> 841 
<212> PRT 

<213> Homo sapiens 



<400> 17 

Met Leu Leu Cys Thr Ala Arg Leu Val Gly Leu Gln Leu Leu Ile Ser 
1 5 10 15 



Cys Cys Trp Ala Phe Ala Cys His Ser Thr Glu Ser Ser Pro Asp Phe 
20 25 30 



oo oo 
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Thr Leu Pro Gly Asp Tyr Leu Leu Ala Gly Leu Phe Pro Leu His Ser 
35 40 45 

Gly Cys Leu Gln Val Arg His Arg Pro Glu Val Thr Leu Cys Asp Arg 
50 55 60 

Ser Cys Ser Phe Asn Glu His Gly Tyr His Leu Phe Gln Ala Met Arg 
65 70 75 80 

Leu Gly Val Glu Glu Ile Asn Asn Ser Thr Ala Leu Leu Pro Asn Ile 
85 90 95 

Thr Leu Gly Tyr Gln Leu Tyr Asp Val Cys Ser Asp Ser Ala Asn Val 
100 105 110 

Tyr Ala Thr Leu Arg Val Leu Ser Leu Pro Gly Gln His His Ile Glu 
115 120 125 

Leu Gln Gly Asp Leu Leu His Tyr Ser Pro Thr Val Leu Ala Val Ile 
130 135 140 

Gly Pro Asp Ser Thr Asn Arg Ala Ala Thr Thr Ala Ala Leu Leu Ser 
145 150 155 160 

Pro Phe Leu Val Pro Met Ile Ser Tyr Ala Ala Ser Ser Glu Thr Leu 
165 170 175 

Ser Val Lys Arg Gln Tyr Pro Ser Phe Leu Arg Thr Ile Pro Asn Asp 
180 185 190 

Lys Tyr Gln Val Glu Thr Met Val Leu Leu Leu Gln Lys Phe Gly Trp 
195 200 205 

Thr Trp Ile Ser Leu Val Gly Ser Ser Asp Asp Tyr Gly Gln Leu Gly 
210 215 220 

Val Gln Ala Leu Glu Asn Gln Ala Thr Gly Gln Gly Ile Cys Ile Ala 
225 230 235 240 

Phe Lys Asp Ile Met Pro Phe Ser Ala Gln Val Gly Asp Glu Arg Met 
245 250 255 

Gln Cys Leu Met Arg His Leu Ala Gln Ala Gly Ala Thr Val Val Val 
260 265 270 

Val Phe Ser Ser Arg Gln Leu Ala Arg Val Phe Phe Glu Ser Val Val 
275 280 285 

Leu Thr Asn Leu Thr Gly Lys Val Trp Val Ala Ser Glu Ala Trp Ala 
290 295 300 

Leu Ser Arg His Ile Thr Gly Val Pro Gly Ile Gln Arg Ile Gly Met 
305 310 315 320 



Val Leu Gly Val Ala Ile Gln Lys Arg Ala Val Pro Gly Leu Lys Ala 
325 330 335 



no no 
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Phe Glu Glu Ala Tyr Ala Arg Ala Asp Lys Lys Ala Pro Arg Pro Cys 
340 345 350 

His Lys Gly Ser Trp Cys Ser Ser Asn Gln Leu Cys Arg Glu Cys Gln 
355 360 365 

Ala Phe Met Ala His Thr Met Pro Lys Leu Lys Ala Phe Ser Met Ser 
370 375 380 

Ser Ala Tyr Asn Ala Tyr Arg Ala Val Tyr Ala Val Ala His Gly Leu 
385 390 395 400 

His Gln Leu Leu Gly Cys Ala Ser Gly Ala Cys Ser Arg Gly Arg Val 
405 410 415 

Tyr Pro Trp Gln Leu Leu Glu Gln Ile His Lys Val His Phe Leu Leu 
420 425 430 

His Lys Asp Thr Val Ala Phe Asn Asp Asn Arg Asp Pro Leu Ser Ser 
435 440 445 

Tyr Asn Ile Ile Ala Trp Asp Trp Asn Gly Pro Lys Trp Thr Phe Thr 
450 455 460 

Val Leu Gly Ser Ser Thr Trp Ser Pro Val Gln Leu Asn Ile Asn Glu 
465 470 475 480 

Thr Lys Ile Gln Trp His Gly Lys Asp Asn Gln Val Pro Lys Ser Val 
485 490 495 

Cys Ser Ser Asp Cys Leu Glu Gly His Gln Arg Val Val Thr Gly Phe 
500 505 510 

His His Cys Cys Phe Glu Cys Val Pro Cys Gly Ala Gly Thr Phe Leu 
515 520 525 

Asn Lys Ser Asp Leu Tyr Arg Cys Gln Pro Cys Gly Lys Glu Glu Trp 
530 535 540 

Ala Pro Glu Gly Ser Gln Thr Cys Phe Pro Arg Thr Val Val Phe Leu 
545 550 555 560 

Ala Leu Arg Glu His Thr Ser Trp Val Leu Leu Ala Ala Asn Thr Leu 
565 570 575 

Leu Leu Leu Leu Leu Leu Gly Thr Ala Gly Leu Phe Ala Trp His Leu 
580 585 590 

Asp Thr Pro Val Val Arg Ser Ala Gly Gly Arg Leu Cys Phe Leu Met 
595 600 605 

Leu Gly Ser Leu Ala Ala Gly Ser Gly Ser Leu Tyr Gly Phe Phe Gly 
610 615 620 

Glu Pro Thr Arg Pro Ala Cys Leu Leu Arg Gln Ala Leu Phe Ala Leu 
625 630 635 640 



oo oo 
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Gly Phe Thr lie Phe Leu Ser Cys Leu Thr Val Arg Ser Phe Gin Leu 
645 650 655 

Ile Ile Ile Phe Lys Phe Ser Thr Lys Val Pro Thr Phe Tyr His Ala 
660 665 670 

Trp Val Gln Asn His Gly Ala Gly Leu Phe Val Met Ile Ser Ser Ala 
675 680 685 

Ala Gln Leu Leu Ile Cys Leu Thr Trp Leu Val Val Trp Thr Pro Leu 
690 695 700 

Pro Ala Arg Glu Tyr Gln Arg Phe Pro His Leu Val Met Leu Glu Cys 
705 710 715 720 

Thr Glu Thr Asn Ser Leu Gly Phe Ile Leu Ala Phe Leu Tyr Asn Gly 
725 730 735 

Leu Leu Ser Ile Ser Ala Phe Ala Cys Ser Tyr Leu Gly Lys Asp Leu 
740 745 750 

Pro Glu Asn Tyr Asn Glu Ala Lys Cys Val Thr Phe Ser Leu Leu Phe 
755 760 765 

Asn Phe Val Ser Trp Ile Ala Phe Phe Thr Thr Ala Ser Val Tyr Asp 
770 775 780 

Gly Lys Tyr Leu Pro Ala Ala Asn Met Met Ala Gly Leu Ser Ser Leu 
785 790 795 800 

Ser Ser Gly Phe Gly Gly Tyr Phe Leu Pro Lys Cys Tyr Val Ile Leu 
805 810 815 

Cys Arg Pro Asp Leu Asn Ser Thr Glu His Phe Gln Ala Ser Ile Gln 
820 825 830 

Asp Tyr Thr Arg Arg Cys Gly Ser Thr 
835 840 



<210> 18 
<211> 14 
<212> PRT 

<213> Artificial Sequence 
<220> 

<221> MOD_RES 

<222> (1) 

<223> Thr or Arg 

<220> 

<221> MOD_RES 

<222> (3) 

<223> Phe or Leu 

<220> 

<221> MOD_RES 



GO 



no 
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<222> (4) 

<223> Arg, Gln or Pro 
<220> 

<221> MOD_RES 

<222> (6) 

<223> Arg or Thr 

<220> 

<221> MOD_RES 
<222> (7) 

<223> Ser, Pro or Val 
<220> 

<221> MOD_RES 
<222> (8) 

<223> Val, Glu, Arg, Lys or Thr 
<220> 

<221> MOD_RES 

<222> (11) 

<223> Ala or Glu 

<220> 

<221> MOD_RES 

<222> (12) 

<223> Trp or Leu 

<220> 

<221> MOD_RES 
<222> (13) 

<223> Arg, His or Gly 
<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<400> 18 

Xaa Cys Xaa Xaa Arg Xaa Xaa Xaa Phe Leu Xaa Xaa Xaa Glu 
1 5 10 



<210> 19 

<211> 15 

<212> PRT 

<213> Artificial Sequence 
<220> 

<221> MOD_RES 

<222> (1) 

<223> Leu or Gln 

<220> 

<221> MOD_RES 

<222> (3) 

<223> Glu, Gly or Thr 



no 



GO 



<220> 

<221> MOD_RES 
<222> (4) 

<223> Asn, Arg or Cys 
<220> 

<221> MOD_RES 

<222> (7) 

<223> Arg or Glu 



<220> 
<221> MOD_RES 
<222> (9) 
<223> Arg or Lys 

<220> 
<221> MOD_RES 
<222> (10) 
<223> Cys, Gly or Phe 



<220> 

<221> MOD_RES 
<222> (11) 

<223> Val, Leu or Ile 
<220> 

<221> MOD_RES 

<222> (13) 

<223> Phe or Leu 

<220> 

<221> MOD_RES 

<222> (14) 

<223> Ala or Asn 

<220> 

<221> MOD_RES 

<222> (15) 

<223> Met or Leu 



<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<400> 19 

Xaa Pro Xaa Xaa Tyr Asn Xaa Ala Xaa Xaa Xaa Thr Xaa Xaa Xaa 
1 5 10 15 



<210> 20 

<211> 3563 

<212> DNA 

<213> Homo sapiens 



<400> 20 

agcctggcag tggcctcagg cagagtctga 
ggacaccact ggggccccag ggtgtggcaa 
tcctctgccc gctccccgcc ccgggctcac 



cgcgcacaaa ctttcaggcc caggaagcga 60 
gtgaggatgg caagggtttt gctaaacaaa 120 
tccatgtgag gccccagtcg gggcagccac 180 



GO 



OO 



23 



ctgccgtgcc 
ctctgggctc 
atgaaggggg 
ctccgcagcc 
tgggtcgggg 
ctgcggttct 
aaatggccgt 
acgacctctt 
tggccaaggc 
gtgtgctggc 
tcagcttctt 
cctgccccgt 
cctgggagcc 
ggagctgctg 
tgtgcagctg 
cctgggcagc 
ggcacgcggc 
gcggctgggg 
gctgctgttc 
gctctcgccc 
gctgcccggc 
gcacgagttc 
ctctgccctg 
gcagtgtgac 
ctctgtctac 
cgcctcaggc 
gggtgtgctg 
aggtggctgg 
gaccttccac 
gtacgacctg 
gttcaacggc 
ggtgaggtga 
ctgggggtgg 
caggcctgtg 
cgccgggtca 
taccggcaaa 
agggtcctgc 
gcgcccttct 
tccccggagc 
ccggctgtgc 
ttggggctgt 
gcctgctttg 
cagcccagcc 
tgcctgagca 
agctgggcag 
ctggccatgc 
gtggtgacgg 
tgggtcagct 
ggcactttcc 
gccatgctgg 
gtggtcctca 
gctgccttcc 
gagttcttcc 
aatcagggga 
gctgcgatcc 
aggttctgac 
acgtggacac 



tgttggaagt 
tcctgcaccc 
actacgtgct 
ggacacggcc 
tcagggtgac 
gtgtggcccc 
ggaggagatc 
tgatacgtgc 
aggcagccgc 
tgtcatcggg 
cctcatgccc 
gggagcccct 
ctgtgtcaga 
agcgcccggg 
acggccgccg 
gacgacgagt 
atctgcatcg 
aaggtgcagg 
gcctccgtgc 
aaggtgtggg 
atggcccaga 
ccccagtacg 
ggcgagaggg 
tgcatcacgc 
gcagctgtgt 
tgccccgcgc 
tcctctgcat 
cggctcagcc 
gtgggcgggc 
aagctgtggg 
agcctcagga 
gggtgggtgt 
gggccgttcc 
cgcagaagcc 
aggggttcca 
acccaggtga 
caagtcctga 
cctctctcac 
gaagcacacg 
tgctgctgct 
tcgttcacca 
gcctggtgtg 
ctgcccgatg 
cactcttcct 
accggctgag 
tggtggaggt 
actggcacat 
tcggcctagc 
tggtgcggag 
cctacttcat 
ggcccgccgt 
acctgcccag 
tgggaggggg 
aacatgagtg 
cccccaagcc 
cccaggttgt 
ccctgtgacc 



tgcctctgcc 
tgggacgggg 

gggggggctg 

cagcagccct 
caggtctggg 
aggttctcct 
aacaacaagt 
tcggagcctg 
gacatcgccg 
ccccactcgt 
cagtggggcg 
tgtgtcagga 
agatgctctt 
agaccttccc 
cggagctgct 
acggccggca 
cgcacgaggg 
acgtcctgca 
acgccgccca 
tggccagcga 
tgggcacggt 
tgaagacgca 
agcagggtct 
tgcagaacgt 
atagcgtggc 
aggaccccgt 
gtgcccaggc 
ccgtcccccg 
tgccgctgcg 
tgtggcaggg 
cagagcgcct 
gccaggcgtg 
agtctcccgt 
cgtgtcccgg 
ctcctgctgc 
gccgccttcc 
ctctgagacc 
agacgacatc 
ctgcttccgc 
cctgctgctg 
tcgggacagc 
cctgggcctg 
cctggcccag 
gcaggcggcc 
tggctgcctg 
cgcactgtgc 
gctgcccacg 
gcacgccacc 
ccagccgggc 
cacctgggtc 
gcagatgggc 
gtgttacctg 
ccctggggat 
acccaaccct 
agcaatgacc 
ctcctgaccc 
atc 



atgctgggcc 
gccccattgt 
ttccccctgg 
gtgtgcacca 
gtgctcctga 
caaacggcct 
cggatctgct 
tggtggccat 
cctactgcaa 
cagagctcgc 
ccccccacca 
gaatgctaca 
ggccttgcag 
ctccttcttc 
gcaggagttc 
gggcctgagc 
cctggtgccg 
ccaggtgaac 
cgccctcttc 
ggcctggctg 
gcttggcttc 
cctggccctg 
ggaggaggac 
gagcgcaggg 
ccaggccctg 
gaagccctgg 
caccaggcac 
cccgcagctc 
gttcgacagc 
ctcagtgccc 
gaagatccgc 
cccgtggtag 
gggcatgccc 
tgctcgcggc 
tacgactgtg 
cggcaggcgg 
agagcccaca 
gcctgcacct 
cgcaggtctc 
agcctggcgc 
ccactggttc 
gtctgcctca 
cagcccttgt 
gagatcttcg 
cgggggccct 
acctggtacc 
gaggcgctgg 
aatgccacgc 
tgctacaacc 
tcctttgtgc 
gccctcctgc 
ctcatgcggc 
gcccaaggcc 
gtgatctcag 
cgtgtctcgc 
tgaccccaca 



ctgctgtcct 
gcctgtcaca 
gcgaggccga 
ggtacagagg 
gctggggccg 
gctctgggca 
gcccgggctg 
gaagcccagc 
ctacacgcag 
catggtcacc 
tcacccaccc 
tgcaccccac 
gtcagctacg 
cgcaccgtgc 
ggctggaact 
atcttctcgg 
ctgccccgtg 
cagagcagcg 
aactacagca 
acctctgacc 
ctccagaggg 
gccaccgacc 
gtggtgggcc 
ctaaatcacc 
cacaacactc 
caggtgagcc 
ggccaccacg 
ctggagaaca 
agcggaaacg 
aggctccacg 
tggcacacgt 
cccccgcggc 
agccgagcag 
agtgccagga 
tggactgcga 
gggtgggaac 
gggtacaaga 
tttgtggcca 
ggttcctggc 
tgggccttgt 
aggcctcggg 
gcgtcctcct 
cccacctccc 
tggagtcaga 
gggcctggct 
tggtggcctt 
tgcactgccg 
tggcctttct 
gtgcccgtgg 
ccctcctggc 
tctgtgtcct 
agccagggct 
agaatgacgg 
ccccggtgaa 
tacagagacc 
gtgagcccta 



gggcctcagc 
gcaacttagg 
ggaggctggc 
tgggacggcc 
aggtggccat 
ctggccatga 
cgcctgggct 
ctcatgttcc 
taccagcccc 
ggcaagttct 
ccaaccaacc 
ccagccctgc 
gtgctagcat 
ccagcgaccg 
gggtggccgc 
ccctggccgc 
ccgatgactc 
tgcaggtggt 
tcagcagcag 
tggtcatggg 
gtgcccagct 
cggccttctg 
agcgctgccc 
accagacgtt 
ttcagtgcaa 
cgggagatgg 
cctgagctgg 
tgtacaacct 
tggacatgga 
acgtgggcag 
ctgacaacca 
agggcgcagc 
agccagaccc 
gggccaggtg 
ggcgggcagc 
gcagcagggg 
cgaacaccca 
ggatgagtgg 
atggggcgag 
gctggctgct 
ggggcccctg 
gttccctggc 
gctcacgggc 
actgcctctg 
ggtggtgctg 
cccgccggag 
cacacgctcc 
ctgcttcctg 
cctcaccttt 
caatgtgcag 
gggcatcctg 
caacaccccc 
gaacacagga 
cccagactta 
ctcccgctct 
ggcctggagc 



240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 

2880 

2940 

3000 

3060 

3120 

3180 

3240 

3300 

3360 

3420 

3480 

3540 

3563 



